from gptqmodel import GPTQModel

# Load the model stored in the local directory below (the directory name
# suggests a 4-bit quantized Qwen3-0.6B checkpoint -- confirm against the files).
model = GPTQModel.load("./Qwen3-0.6B-gptqmodel-4bit")

# Pass the raw prompt string to generate() and keep only the first entry of
# what it returns; that entry is the generated token sequence.
prompt = "Uncovering deep insights begins with"
outputs = model.generate(prompt)
result = outputs[0]  # tokens

# Turn the tokens back into text with the model's own tokenizer and print it.
text = model.tokenizer.decode(result)  # string output
print(text)